library(tidyverse)
library(plotly)

plotly vs ggplot2

mpg %>%
  ggplot(aes(displ, hwy, color = factor(cyl))) + geom_point() +
  guides(color = guide_legend("cyl"))

mpg %>% 
  plot_ly(x = ~displ, y = ~hwy, color =  ~factor(cyl))

Cons: - Interactive - Plotly handles multiple wide data columns (ggplot2 requies long format) - Plotly works for Python, Matlab, and Excel, among other languages - Easy layout customization - 3D charts

Pros: - Doesn’t work very well with pdf - Facet wrapping is a bit complicated compared with ggplot2 - adding legend title is difficult

ggplot(mpg, aes(displ, hwy)) + 
  geom_point(data = mutate(mpg, cyl = NULL), color = "grey75") +
  geom_point() +
  facet_wrap(vars(cyl))

ggplotly function for ggplot2 users

p <- mpg %>%
  mutate(cyl = as_factor(cyl)) %>%
  ggplot(aes(displ, hwy, color = cyl)) + geom_point()
ggplotly(p)

We won’t learn (much of)

  • ggplot2 (or should we?)

  • HTML, SVG, CSS, JavaScript

  • d3.js (R package r2d3)

Scatter plots + lines

p <- economics %>%
  sample_n(n()) %>%
  plot_ly(x = ~date, y = ~psavert)
p %>% add_paths()  # using the order of the data frame 
p %>% add_lines() 
library(lubridate)
## 
## Attaching package: 'lubridate'
## The following object is masked from 'package:base':
## 
##     date
econ <- economics %>%
  mutate(yr = year(date), mnth = month(date))

# One trace (more performant, but less interactive)
econ %>%
  group_by(yr) %>%
  plot_ly(x = ~mnth, y = ~uempmed) %>%
  add_lines(text = ~yr)
# Multiple traces (less performant, but more interactive)
plot_ly(econ, x = ~mnth, y = ~uempmed) %>%
  add_lines(color = ~ordered(yr))

Use Canvas rather then SVG for large dataset

plot_ly(econ, x = ~mnth, y = ~uempmed) %>%
  add_lines(color = ~ordered(yr)) %>%
  toWebGL()

Markers

  • alpha blending to see replicates
mpg %>% 
  plot_ly(x = ~cty, y = ~hwy) %>% 
  add_markers(alpha = 0.2)
  • colors for grouping
mtcars %>% 
  plot_ly(x = ~disp, y = ~mpg) %>% 
  add_markers(color = ~factor(cyl))
  • symbols
mtcars %>% 
  plot_ly(x = ~disp, y = ~mpg) %>% 
  add_markers(symbol = ~factor(cyl))

Error bar plot

mpg %>% 
  group_by(cyl) %>%
  summarize(mhwy = mean(hwy), se = sd(hwy)/sqrt(n())) %>%
  plot_ly(x = ~mhwy, y = ~factor(cyl)) %>%
  add_markers(error_x = ~list(value = se)) %>%
  layout(xaxis = list(title = "mean hwy"), yaxis = list(title = "cyl"))

Segments

mpg %>%
  group_by(model) %>%
  summarize(c = mean(cty), h = mean(hwy)) %>%
  mutate(model = forcats::fct_reorder(model, c)) %>%
  plot_ly() %>%
  add_segments(
    x = ~c, y = ~model,
    xend = ~h, yend = ~model, 
    color = I("gray"), showlegend = FALSE
  ) %>%
  add_markers(
    x = ~c, y = ~model, 
    color = I("blue"), 
    name = "mpg city"
  ) %>%
  add_markers(
    x = ~h, y = ~model, 
    color = I("red"),
    name  = "mpg highway"
  ) %>%
  layout(xaxis = list(title = "Miles per gallon"))

Histograms

mpg %>%
  plot_ly(x= ~hwy, color = ~factor(cyl)) %>% 
  add_histogram(histnorm = "", alpha = 0.7) %>%  # histnorm could be "", "probability", "density" and "probability density"
  layout(barmode = "overlay")  # barmode could be "overlay", "stack" and "group"
# work with wide format directly
relig_income %>% 
  mutate(religion = as_factor(religion)) %>%
  plot_ly(y = ~religion) %>% 
  add_bars(~`$10-20k`, name = "$10-20k") %>%
  add_bars(~`$50-75k`, name = "$50-75k") %>%  
  layout(xaxis = list(title = "income"))

Bar plots

mpg %>%
  mutate(cyl = as_factor(cyl)) %>% 
  count(drv, cyl) %>%
  plot_ly(x = ~drv, y = ~n, color = ~cyl) %>% 
  add_bars() %>% 
  layout(barmode = "stack")

Box plots

mpg %>%
  mutate(cyl = as_factor(cyl)) %>% 
  plot_ly(x = ~drv, y = ~hwy, color = ~cyl) %>% 
  add_boxplot() %>% 
  layout(boxmode = "group")
## Warning: 'layout' objects don't have these attributes: 'boxmode'
## Valid attributes include:
## 'font', 'title', 'autosize', 'width', 'height', 'margin', 'paper_bgcolor', 'plot_bgcolor', 'separators', 'hidesources', 'showlegend', 'colorway', 'datarevision', 'uirevision', 'editrevision', 'selectionrevision', 'template', 'modebar', 'meta', 'transition', '_deprecated', 'clickmode', 'dragmode', 'hovermode', 'hoverdistance', 'spikedistance', 'hoverlabel', 'selectdirection', 'grid', 'calendar', 'xaxis', 'yaxis', 'ternary', 'scene', 'geo', 'mapbox', 'polar', 'radialaxis', 'angularaxis', 'direction', 'orientation', 'editType', 'legend', 'annotations', 'shapes', 'images', 'updatemenus', 'sliders', 'colorscale', 'coloraxis', 'metasrc', 'barmode', 'bargap', 'mapType'

3D charts

mpg %>%
  mutate(cyl = as_factor(cyl)) %>%
  plot_ly(x = ~cty, y = ~hwy, z = ~cyl) %>%
  add_markers(color = ~cyl)
x <- seq_len(nrow(volcano)) + 100
y <- seq_len(ncol(volcano)) + 500
plot_ly() %>% add_surface(x = ~x, y = ~y, z = ~volcano, colorscale = "Earth")
# heatmap
plot_ly() %>% add_heatmap(x = ~x, y = ~y, z = ~volcano, colorscale = "Earth")

Arranging views

Animating views

References